% Compatibility preamble.
% The records below pass four arguments to \contentsline and a five-part
% second argument to \newlabel. When \hyper@anchor (a hyperref internal) is
% not defined, wrappers are installed that drop the extra parts and forward
% the remainder to the saved original commands.
\relax
\ifx\hyper@anchor\@undefined
  % Keep the original \contentsline and replace it by a four-argument
  % version that ignores its fourth argument.
  \global\let\oldcontentsline\contentsline
  \global\def\contentsline#1#2#3#4{\oldcontentsline{#1}{#2}{#3}}
  % Keep the original \newlabel; the replacement unpacks the five-part
  % second argument and forwards only its first two parts.
  \global\let\oldnewlabel\newlabel
  \global\def\newlabel#1#2{\newlabelxx{#1}#2}
  \global\def\newlabelxx#1#2#3#4#5#6{\oldnewlabel{#1}{{#2}{#3}}}
  % Put the saved definitions back at the end of the document.
  \AtEndDocument{\let\contentsline\oldcontentsline
    \let\newlabel\oldnewlabel}
\else
  % \hyper@anchor is defined: only reset \hyper@last.
  \global\let\hyper@last\relax
\fi

% Table-of-contents records for section 1 and the start of section 2,
% interleaved with the \citation keys recorded between them.
% Each \contentsline gives the entry level, the numbered title, the page
% number, and a fourth argument (e.g. section.1) -- presumably the link
% anchor name used by hyperref.
\@writefile{toc}{\contentsline {section}{\numberline {1}Introduction}{1}{section.1}}
\@writefile{toc}{\contentsline {subsection}{\numberline {1.1}The problem}{1}{subsection.1.1}}
\citation{dayan1993feudal}
\citation{mataric1997behaviour}
\citation{sutton1998reinforcement}
\@writefile{toc}{\contentsline {subsection}{\numberline {1.2}Our approach}{2}{subsection.1.2}}
\@writefile{toc}{\contentsline {subsubsection}{\numberline {1.2.1}A Learning Approach}{2}{subsubsection.1.2.1}}
\@writefile{toc}{\contentsline {subsubsection}{\numberline {1.2.2}Lower-level control systems}{2}{subsubsection.1.2.2}}
\@writefile{toc}{\contentsline {section}{\numberline {2}Representation}{2}{section.2}}
\@writefile{toc}{\contentsline {subsection}{\numberline {2.1}The environment}{2}{subsection.2.1}}
% Figure 1 (page 3): list-of-figures entry and cross-reference label.
% The label key was originally fig:neighborcells, which is defined a second
% time for figure 2 further down this file. LaTeX reports such a key as
% "multiply defined" and the later definition overwrites the earlier one, so
% figure 1 could not be referenced. It gets its own key here; references to
% fig:neighborcells keep resolving to figure 2 as before.
% NOTE(review): fig:gridroom is a proposed name. The matching \label in the
% .tex source must be renamed as well, otherwise the next LaTeX run writes
% the duplicate key again -- confirm the key with the author.
\@writefile{lof}{\contentsline {figure}{\numberline {1}{\ignorespaces Grid-representation of entire room.}}{3}{figure.1}}
\newlabel{fig:gridroom}{{1}{3}{Grid-representation of entire room}{figure.1}{}}
% Records for subsection 2.2 and all of section 3 (pages 3-6): toc entries,
% the citation keys recorded between them, and the list-of-figures entry
% plus label for figure 2.
% The \newlabel second argument holds five parts: figure number, page,
% caption text, an anchor name (figure.2), and an empty final part.
\@writefile{toc}{\contentsline {subsection}{\numberline {2.2}Grid size and the curse of dimensionality}{3}{subsection.2.2}}
\citation{sutton1999between}
\citation{busoniu2008comprehensive}
\@writefile{toc}{\contentsline {section}{\numberline {3}Learning to clean a room}{4}{section.3}}
\@writefile{toc}{\contentsline {subsection}{\numberline {3.1}Actions and Options}{4}{subsection.3.1}}
\@writefile{toc}{\contentsline {subsection}{\numberline {3.2}Multiagent Problem}{4}{subsection.3.2}}
\citation{oliehoek2010decision}
\@writefile{toc}{\contentsline {subsection}{\numberline {3.3}Partial Observability}{5}{subsection.3.3}}
\@writefile{lof}{\contentsline {figure}{\numberline {2}{\ignorespaces Grid cells the agent can observe}}{5}{figure.2}}
\newlabel{fig:neighborcells}{{2}{5}{Grid cells the agent can observe\relax }{figure.2}{}}
\@writefile{toc}{\contentsline {subsection}{\numberline {3.4}Generalization}{6}{subsection.3.4}}
% Records for section 4 "Results" (pages 6-10): toc entries for subsections
% 4.1-4.4, list-of-figures entries and labels for figures 3-9, and the
% citation keys recorded between them.
\@writefile{toc}{\contentsline {section}{\numberline {4}Results}{6}{section.4}}
\@writefile{toc}{\contentsline {subsection}{\numberline {4.1}Online vs Offline learning}{6}{subsection.4.1}}
\@writefile{toc}{\contentsline {subsection}{\numberline {4.2}The value of teamwork}{6}{subsection.4.2}}
\@writefile{toc}{\contentsline {subsection}{\numberline {4.3}Grid Size}{6}{subsection.4.3}}
% Figures 3 and 4 (page 7).
\@writefile{lof}{\contentsline {figure}{\numberline {3}{\ignorespaces Comparison of state space size during online learning on a 5x5 grid.}}{7}{figure.3}}
\newlabel{fig:states5x5}{{3}{7}{Comparison of state space size during online learning on a 5x5 grid}{figure.3}{}}
\@writefile{lof}{\contentsline {figure}{\numberline {4}{\ignorespaces State space size during offline learning on a 3x3 grid for one agent}}{7}{figure.4}}
\newlabel{fig:states3x3-1ag}{{4}{7}{State space size during offline learning on a 3x3 grid for one agent\relax }{figure.4}{}}
\citation{evolutionairvoordeel}
% Figures 5 and 6 (page 8).
\@writefile{lof}{\contentsline {figure}{\numberline {5}{\ignorespaces State space size for various experiments.}}{8}{figure.5}}
\newlabel{fig:statesGilles}{{5}{8}{State space size for various experiments}{figure.5}{}}
\@writefile{lof}{\contentsline {figure}{\numberline {6}{\ignorespaces Comparison of several settings on a 3x3 grid.}}{8}{figure.6}}
\newlabel{fig:comparison}{{6}{8}{Comparison of several settings on a 3x3 grid}{figure.6}{}}
\@writefile{toc}{\contentsline {subsection}{\numberline {4.4}Comparison to planning approach}{8}{subsection.4.4}}
\citation{tesauro1995temporal}
\citation{koppejan2009neuroevolutionary}
\citation{whiteson2011protecting}
\citation{busoniu2008comprehensive}
\citation{oliehoek2010decision}
% Figures 7 and 8 (page 9) and figure 9 (page 10).
\@writefile{lof}{\contentsline {figure}{\numberline {7}{\ignorespaces Offline learning process of 3 agents on a 3x3 grid cleaning 20 crumbs, with coordination of their moves}}{9}{figure.7}}
\newlabel{fig:coord}{{7}{9}{Offline learning process of 3 agents on a 3x3 grid cleaning 20 crumbs, with coordination of their moves\relax }{figure.7}{}}
\@writefile{lof}{\contentsline {figure}{\numberline {8}{\ignorespaces Offline learning process of 3 agents on a 3x3 grid cleaning 20 crumbs, without coordination of their moves}}{9}{figure.8}}
\newlabel{fig:nocoord}{{8}{9}{Offline learning process of 3 agents on a 3x3 grid cleaning 20 crumbs, without coordination of their moves\relax }{figure.8}{}}
\@writefile{lof}{\contentsline {figure}{\numberline {9}{\ignorespaces Online learning process of 3 agents on a 3x3 grid, with a linear fit.}}{10}{figure.9}}
\newlabel{fig:3x3random}{{9}{10}{Online learning process of 3 agents on a 3x3 grid, with a linear fit}{figure.9}{}}
% Table-of-contents records for section 5 (page 10).
\@writefile{toc}{\contentsline {section}{\numberline {5}Discussion \& Future Work}{10}{section.5}}
\@writefile{toc}{\contentsline {subsection}{\numberline {5.1}Scalability}{10}{subsection.5.1}}
% Bibliography data: style name (IEEEtran) and database name (refs).
\bibstyle{IEEEtran}
\bibdata{refs}
% Each \bibcite pairs a citation key with its reference number (1-10).
\bibcite{dayan1993feudal}{1}
\bibcite{mataric1997behaviour}{2}
\bibcite{sutton1998reinforcement}{3}
\bibcite{sutton1999between}{4}
\bibcite{busoniu2008comprehensive}{5}
\bibcite{oliehoek2010decision}{6}
\bibcite{evolutionairvoordeel}{7}
\bibcite{tesauro1995temporal}{8}
\bibcite{koppejan2009neuroevolutionary}{9}
\bibcite{whiteson2011protecting}{10}
